tableName:github_projects
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive
inputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat
outputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:2
totalFileSize:2043645651
maxFileSize:2043645374
minFileSize:277
lastAccessTime:0
lastUpdateTime:1455974890000

Before running the INSERT OVERWRITE below:
tableName:github_projects_asnappy
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_asnappy
inputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat
outputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:199
totalFileSize:2135894040
maxFileSize:16810864
minFileSize:10615104
lastAccessTime:0
lastUpdateTime:1455966332000

-- Rewrite github_projects_asnappy in place so that its Avro files are
-- recompressed and re-split into roughly equal-sized files.

-- Output compression.
SET hive.exec.compress.output=true;
SET mapred.output.compression.type=BLOCK;
SET mapred.output.compression.codec=org.apache.hadoop.io.compress.SnappyCodec;
-- The target table is written through AvroContainerOutputFormat. Per the Hive
-- AvroSerDe documentation, the Avro container codec is chosen with
-- avro.output.codec, not with the Hadoop codec property above, so Snappy has
-- to be requested here explicitly.
-- NOTE(review): the table stats recorded in this file were captured without
-- this line; the post-rewrite total size is nearly identical to
-- github_projects_az3, which suggests that run did not produce Snappy output.
-- Re-run and re-record the stats to confirm.
SET avro.output.codec=snappy;

-- Local scratch and warehouse directories for this session.
SET hadoop.tmp.dir=/mnt/data/home/mdupont/oel/data/github/hive/temp;
SET hive.metastore.warehouse.dir=/mnt/data/home/mdupont/oel/data/github/hive/;

-- File sizing: every size knob uses the same 10240000-byte (about 10 MB) target.
SET dfs.block.size=10240000;
-- parquet.block.size is carried along from the Parquet experiments.
-- NOTE(review): presumably it has no effect on this Avro table -- confirm.
SET parquet.block.size=10240000;
SET hive.exec.reducers.bytes.per.reducer=10240000;
-- Merge small map-only outputs into files of about the target size.
SET hive.merge.mapfiles=true;
SET hive.merge.size.per.task=10240000;
SET hive.merge.smallfiles.avgsize=10240000;
-- Cap the input split size at the same target.
SET mapred.max.split.size=10240000;

-- Source and target are the same table on purpose: this is a whole-table
-- rewrite, so every column is carried over unchanged with SELECT *.
INSERT OVERWRITE TABLE github_projects_asnappy
SELECT *
FROM github_projects_asnappy;

After running the INSERT OVERWRITE above:
tableName:github_projects_asnappy
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_asnappy
inputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat
outputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:66
totalFileSize:742289940
maxFileSize:20089860
minFileSize:10219088
lastAccessTime:0
lastUpdateTime:1455977735000


tableName:github_projects_az
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_az
inputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat
outputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:199
totalFileSize:2135893045
maxFileSize:16810859
minFileSize:10615099
lastAccessTime:0
lastUpdateTime:1455935348000

tableName:github_projects_az2
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_az2
inputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat
outputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:199
totalFileSize:2135893244
maxFileSize:16810860
minFileSize:10615100
lastAccessTime:0
lastUpdateTime:1455964350000

tableName:github_projects_az3
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_az3
inputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat
outputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:67
totalFileSize:742307235
maxFileSize:13416052
minFileSize:3822060
lastAccessTime:0
lastUpdateTime:1455964955000

tableName:github_projects_az4
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_az4
inputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerInputFormat
outputformat:org.apache.hadoop.hive.ql.io.avro.AvroContainerOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:199
totalFileSize:2135893244
maxFileSize:16810860
minFileSize:10615100
lastAccessTime:0
lastUpdateTime:1455965287000















tableName:github_projects_pgz
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_pgz
inputformat:org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat
outputformat:org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:67
totalFileSize:902523166
maxFileSize:13993256
minFileSize:9044963
lastAccessTime:0
lastUpdateTime:1455933960000

tableName:github_projects_ps
archive.org:OelGithubProjectsParquetSnappy
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_ps
inputformat:org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat
outputformat:org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:597
totalFileSize:4406505316
maxFileSize:16645387
minFileSize:3926751
lastAccessTime:0
lastUpdateTime:1455931502000

tableName:github_projects_ps2
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_ps2
inputformat:org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat
outputformat:org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:1
totalFileSize:14799512
maxFileSize:14799512
minFileSize:14799512
lastAccessTime:0
lastUpdateTime:1455882346000

tableName:github_projects_ps3
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_ps3
inputformat:org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat
outputformat:org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:1
totalFileSize:15450
maxFileSize:15450
minFileSize:15450
lastAccessTime:0
lastUpdateTime:1455883550000

tableName:github_projects_ps4
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_ps4
inputformat:org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat
outputformat:org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat
columns:struct columns { i32 id, string owner_type, string name, string description, string full_name, string owner_name, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:1
totalFileSize:15347
maxFileSize:15347
minFileSize:15347
lastAccessTime:0
lastUpdateTime:1455883924000

tableName:github_projects_pssn
archive.org:oel_github_projects_snappy_hive
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_pssn
inputformat:org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat
outputformat:org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:100
totalFileSize:1417888955
maxFileSize:14625414
minFileSize:11271128
lastAccessTime:0
lastUpdateTime:1455932360000




TEXT


tableName:github_projects_t
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_t
inputformat:org.apache.hadoop.mapred.TextInputFormat
outputformat:org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:398
totalFileSize:2823081536
maxFileSize:16943171
minFileSize:2879187
lastAccessTime:0
lastUpdateTime:1455935970000

tableName:github_projects_i
owner:mdupont
location:file:/mnt/data/home/mdupont/oel/data/github/hive/github_projects_i
inputformat:org.apache.hadoop.mapred.TextInputFormat
outputformat:org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
columns:struct columns { i32 id, bool fork, string name, string description, string full_name, string owner_name, string owner_type, string html_url}
partitioned:false
partitionColumns:
totalNumberFiles:7
totalFileSize:2152276311
maxFileSize:534169493
minFileSize:269407793
lastAccessTime:0
lastUpdateTime:1455794982000
